import pandas as pd
# Location of the sampled QA parquet file (absolute path on the local machine).
_qa_sample_path = r'D:\laern_langchain\bjq1021\content\eli5_data\qa_sample.parquet'

# Load the parquet file into a DataFrame.
qa_df = pd.read_parquet(_qa_sample_path)

# Report how many rows were loaded; the message reads
# "The original data has N records in total".
_qa_record_count = len(qa_df)
print(f"原始数据总共有 {_qa_record_count} 条记录")